import json
import pandas as pd
import matplotlib.pyplot as plt

# Compare two extracted DESED/FSD50K tables by their "fname" column and
# report how many distinct file names appear in both of them.
DOMESTIC_SOUNDS_CSV = "../../src/extracted/DESED_FSD50K_domestic_sounds.csv"
LABEL_MAPPING_CSV = (
    "../../src/extracted/DESED_FSD50K_label_mapping_non_single_speech.csv"
)

dom_df = pd.read_csv(DOMESTIC_SOUNDS_CSV)
lm_df = pd.read_csv(LABEL_MAPPING_CSV)

# Sets collapse repeated names, so the overlap below counts unique file
# names only.
_dom_fnames = set(dom_df["fname"])
_lm_fnames = set(lm_df["fname"])
dup = len(_dom_fnames & _lm_fnames)

# The trailing numbers are the values noted by the original author from a
# previous run. Note that the "out of" figure is the row count of dom_df,
# not its number of unique file names.
print(f"Number of label_mapping: {len(lm_df)}")  # 1989
print(
    f"Number of duplicated files: {dup} out of {len(dom_df)}"
)  # 1653; 8009